Ben Rosenberg

# Custom Functions

getPop = function(schoolnameV, yearV) {
  n = yearV-2011
  converter = list()
  converter[["Macalester"]] = "Macalester College"
  converter[["HU"]] =  "Hamline University"
  converter[["St. Olaf"]] = "St Olaf College"
  converter[["Gustavus"]] =  "Gustavus Adolphus College"
  converter[["Bethel"]] = "Bethel University"
  converter[["Augsburg"]] =  "Augsburg University"
  converter[["Carleton"]] =  "Carleton College"
  converter[["St. Benedict"]] = "College of Saint Benedict"
  converter[["Concordia"]] = "Concordia University-Saint Paul"
  converter[["St. John"]] = "Saint Johns University"
  converter[["St. Scholastica"]] = "The College of Saint Scholastica"
  converter[["St. Kate"]] ="St Catherine University"
  converter[["St. Mary"]] ="Saint Mary's University of Minnesota"
  
  out = c()
  for (i in 1:length(schoolnameV)) {
    out = c(out, pop[converter[[schoolnameV[i]]]][n[i],])
  }
  
  return(out)
}

thou_to_int = function(x) {
  y = str_replace_all(x, ',', '')
  y = str_replace_all(y, '-', '0')
  y = as.numeric(y)
  return(y)
}
#Loading Data
miac_id = c(174899, 174844, 174817, 174792, 175005, 173902, 173665, 173647, 173328, 174747, 173258, 173160, 173045)

enrollment = read.csv('/Users/blrosenberg/RStudio/DataViz/Hamline Finances/MNEnrollment.csv') %>%
  mutate_at(.vars=vars(-Unit.Id, -Institution.Name), .funs=thou_to_int)
en_miac = enrollment %>% filter(Unit.Id %in% miac_id) %>% select(-Unit.Id) %>% t() %>% data.frame()
rownames(en_miac) = str_replace_all(rownames(en_miac), 'X', '')
colnames(en_miac) = en_miac[1,]
en_miac = en_miac[2:11,]
pop = en_miac

id_name_conv = enrollment %>% filter(Unit.Id %in% miac_id) %>% select(Unit.Id, Institution.Name)

idnum_to_name = function(idnum) {
  return ((id_name_conv %>% filter(Unit.Id==idnum))$Institution.Name)
}

pc = read.csv('/Users/blrosenberg/Coding/Python_Projects/Classes/Oracle/990s/MIAC/PayCombined.csv') %>% 
  mutate(isHU = ifelse(School=="HU", "Hamline", "MIAC (mean)")) %>% mutate(pop = getPop(School, Year))

yrPop = pop %>% mutate(Year = rownames(pop)) %>%
  pivot_longer(cols=-c(Year), names_to="School", values_to="Population") %>% 
  mutate(School = str_replace_all(str_replace_all(School, '\\.s', "'s"), '\\.', ' '))
  
yrPop = yrPop %>% left_join(yrPop %>% group_by(Year) %>% summarize(MIAC_Pop = sum(as.numeric(Population)))) %>%
  mutate(Portion = as.numeric(Population)/MIAC_Pop)

courses = read.csv('/Users/blrosenberg/Coding/Python_Projects/Classes/Oracle/Bulletins/Workday/courses.csv')

programs = read.csv('/Users/blrosenberg/Coding/Python_Projects/Classes/Oracle/Bulletins/programs.csv') %>% mutate_at(.vars=c('cert', 'major', 'minor', 'prep', 'license', 'diploma'), .funs=as.logical) 
retention = read.csv('/Users/blrosenberg/RStudio/DataViz/Hamline Finances/Retention.csv')

for (i in 2012:2022) {
  assign(paste0('tuits', i), read.csv(paste0('/Users/blrosenberg/Coding/Python_Projects/Classes/Oracle/990s/Tuition/ic', i, '_ay.csv')))
}

tuits2012 = tuits2012 %>% mutate(UNITID = as.numeric(rownames(tuits2012)))
tuits_full = list(tuits2012, tuits2013, tuits2014, tuits2015,
             tuits2016, tuits2017, tuits2018, tuits2019,
             tuits2020, tuits2021, tuits2022) %>% reduce(full_join)
  
tuits2012 = tuits2012 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2012)
tuits2013 = tuits2013 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2013)
tuits2014 = tuits2014 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2014)
tuits2015 = tuits2015 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2015)
tuits2016 = tuits2016 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2016)
tuits2017 = tuits2017 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2017)
tuits2018 = tuits2018 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2018)
tuits2019 = tuits2019 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2019)
tuits2020 = tuits2020 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2020)
tuits2021 = tuits2021 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2021)
tuits2022 = tuits2022 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2022)

tuits = list(tuits2012, tuits2013, tuits2014, tuits2015,
             tuits2016, tuits2017, tuits2018, tuits2019,
             tuits2020, tuits2021, tuits2022) %>% reduce(full_join)

tuits = tuits %>% mutate(amt = as.numeric(ifelse(TUITION1=="R", XTUIT1, TUITION1))) %>% select(Name, YR, amt) %>% mutate(isHU = ifelse(Name=="Hamline University", "Hamline", "MIAC"), Year=YR)
# Styling

font_add('Avenir', "/Users/blrosenberg/Coding/Python_Projects/Classes/Oracle/fonts/Avenir.ttc", bold="/Users/blrosenberg/Coding/Python_Projects/Classes/Oracle/fonts/AvenirBlack.ttf", italic="/Users/blrosenberg/Coding/Python_Projects/Classes/Oracle/fonts/AvenirLight.ttf")
textsz = 20

xscale = scale_x_continuous(breaks = c(2012:2021), limits=c(2012, 2021))
disc_size = scale_size_discrete(range=c(0.8, 2))
disc_col =scale_color_manual(values = c("#ea5545", "#f46a9b", "#ef9b20", "#edbf33", "#ede15b", "#bdcf32", "#87bc45", "#27aeef", "#b33dc6", "#00ffff", "#000000", "red", "darkgray", "blue"))
hides = guides(linetype="none", size="none")
dollars = scale_y_continuous(labels = scales::label_dollar())
pct = scale_y_continuous(labels = scales::label_percent())
btm = theme(legend.position="bottom")
miac_green = "#0f7754"
hamline_red = "#9d2235"

Introduction + Data Background

As part of my work for the campus newspaper, The Oracle, during President Miller’s retirement, I opted to review some of Hamline’s data to get a fuller, quantitative assessment of the state of the university throughout her eight-year presidency (Fall 2015 – Fall 2023).

The visualizations that follow make use of several queried sets of university population and tuition data from the National Center for Education Statistics’ Integrated Postsecondary Education Data System (IPEDS) in combination with my own custom-scraped datasets derived from a few different sources.

Namely, those are:

Students

Hamline is shrinking. Why it is shrinking is beyond our scope here, but these data do allow us to give more consideration to how severely and for how long the enrollment numbers have been falling. With that context, we are better prepared to assess Miller’s administration’s impact on enrollment. For better or worse, did they make a difference?

A decade ago, Hamline was one of the largest universities in its athletic conference, the Minnesota Intercollegiate Athletic Conference (MIAC). Since then, Hamline’s enrollment numbers have fallen.

Miller’s administration did not produce a noticeable change in the university’s depopulation rate.

Total Student Population over time, Hamline vs. mean in the MIAC

#pdf('PopulationChange.pdf', width=12, height=9)
en_miac %>% mutate(Year = rownames(en_miac)) %>%
  pivot_longer(cols=-c(Year), names_to="School", values_to="Population") %>% 
  mutate(isHU = ifelse(School=="Hamline University", "Hamline", "MIAC (mean)")) %>% 
  group_by(Year, isHU) %>% summarize(Population = mean(as.numeric(Population)), Year=as.numeric(Year[1])) %>%
  ggplot(aes(x=Year, y=Population)) + geom_line(aes(col=isHU), linewidth=4) + labs(col="", y="Total Student Population") +
  geom_vline(xintercept=2015.5, linetype="dashed") +
  geom_text(x=2015.7, y=4400, label="President Miller's First Term", angle=90, family="Avenir", face="italic", size=textsz*0.28) +
  scale_x_continuous(breaks=c(2012:2021), labels=c("'12", "'13", "'14", "'15", "'16", "'17", "'18", "'19", "'20", "'21")) + theme_minimal() +
  guides(col=guide_legend(nrow=2, byrow=T)) +
  theme(axis.text.x = element_text( vjust=1),
        text=element_text(family="Avenir", size=textsz),
        axis.title = element_text(face="bold", size=textsz*1.2),
        axis.title.x = element_text(hjust=0.5, vjust=-4),
        axis.title.y = element_text(hjust=0.5, vjust=1.4),
        plot.title = element_text(face="bold"),
        legend.position = "bottom",
        legend.direction = "vertical",
        legend.justification="right",
        legend.box.margin = margin(-50, 3, 0, 0),
        legend.text = element_text(size=textsz*0.95),
        legend.spacing.y = unit(20, "pt")
        ) + 
  scale_color_manual(values=c(hamline_red, miac_green))

#dev.off()

While Hamline’s enrollment fell steadily, enrollment numbers stayed relatively stable throughout the rest of the MIAC. As a result, the portion of students in the MIAC who attended Hamline also reliably decreased year after year.

The Shrinking Portion of MIAC Students Attending Hamline Since 2012

schoolCols = c("#666666", "#0069aa", "#0b5091", "#be0f34", "#E6B220", "#FFF", hamline_red, 
               "#D44420", "#000", "#E22739", "#4F2682", "#53585a", "#00447c")
schoolCols2 = c("#660033","#B09247","#FFD24F", "#000", "#003055","#FCCB06", "#888C8D", 
                "#01426A", "#FFFFFE", "#0C2F59", "#FFE153", "#242121", "#FFCB00")

aval <- list()
for(step in 1:10) {
  yr = step+2011
  aval[[step]] <-list(visible = FALSE,
                      name = paste0('Year = ', yr),
                      label = yr,
                      x=(yrPop %>% filter(Year==yr) %>% arrange(School))$School,
                      y=(yrPop %>% filter(Year==yr) %>% arrange(School))$Population,
                      text=(yrPop %>% filter(Year==yr) %>% arrange(School))$Portion)
}
aval[3][[1]]$visible = T

steps <- list()
fig <- plot_ly(sort=F)
for (i in 1:10) {
  yr = i+2011
  fig = fig %>% add_pie(labels=aval[i][[1]]$x, 
                        values=aval[i][[1]]$y,
                        #text=aval[i][[1]]$x,
                        visible = aval[i][[1]]$visible, 
                        marker = list(colors=schoolCols, line=list(color=schoolCols2, width=2)),
                        pull = 0.03,
                        name = '',#aval[i][[1]]$name, 
                        type = 'pie', 
                        hoverinfo = 'text',
                        hovertext = paste(
                          aval[i][[1]]$x, '\n', 
                          scales::percent(aval[i][[1]]$text, accuracy=0.01), 'of the MIAC\n', 
                          aval[i][[1]]$y, "Students"
                        ))

  step <- list(args = list('visible', rep(FALSE, length(aval))),
               method = 'restyle', label=yr)
  step$args[[2]][[i]] = TRUE  
  steps[[i]] = step 
} 

fig <- fig %>%
  layout(sliders = list(list(active = 0,
                             currentvalue = list(prefix = "Year: "),
                             steps = steps)))

fig

Like emigration from a country, the size of the student population at Hamline should be understood as complicated and affected subtly by many factors: some positive and some negative. Those factors include, but are not limited to, the number of applications, acceptance rate, enrollment rate (among those who have been admitted), transfers-in, transfers-out, and withdrawal rates. Put more simply: how many are coming in, how many are coming back, and how many are leaving?

Universities use a fairly strictly-defined metric, retention, to quantify the “How many are coming back?” portion of that equation. Rather than more generally tracking the portion of students in a given semester who also attended the same school in the previous semester, the National Center for Education Statistics specifically tracks the portion of a university’s first-time students in the fall semester of their first year (that year’s “cohort”) who return in subsequent semesters.3

Looking at Hamline’s officially reported retention rates since 2006, we can see a distinct change: long-term retention has fallen, and the size of the cohort has grown. Most notably, the cohort size grew by 35% from 2009 to 2012 while the four-year retention rate fell from 58% to 54.3% over that same period. Though that change precedes Miller’s term, the trend continued throughout the available data.

Change in Student Retention at Hamline, 2006-2019

p_to_n = function(period) {
  converter = list()
  converter["Fall1"] = 1
  converter["Fall2"] = 3
  converter["Fall3"] = 5
  converter["Fall4"] = 7
  converter["Spring1"] = 2
  converter["Spring2"] = 4
  converter["Spring3"] = 6
  converter["Spring4"] = 8
  out = c()
  for (i in period) {
    out = c(out, converter[[i]])
  }
  return(out)
}

ret2 = retention %>% mutate_all(.funs=as.numeric) %>% rename(Fall1N = Cohort) %>% 
  pivot_longer(cols=-c(Year), names_to="Period", values_to="Retained") %>% 
  mutate(isPct = !str_ends(Period, "N"), pct = Retained*isPct, Period = str_replace_all(Period, "N", ""), o=p_to_n(Period)) %>%
  group_by(Year, o) %>% summarize(pct=max(pct), ct=max(Retained))  %>% mutate(pct=ifelse(pct==0, 1, pct))

gg = ret2 %>% filter(Year==2006) %>%
  ggplot(aes(x=o, y=ct)) + geom_bar(aes(alpha=pct), stat="identity", fill=hamline_red) + coord_flip() +
  theme_minimal() + 
  scale_alpha_continuous(range=c(0.7, 1)) +
  scale_x_continuous(breaks=(1:8), 
                                       labels=c("1st Fall", "1st Spring",
                                                "2nd Fall", "2nd Spring",
                                                "3rd Fall", "3rd Spring",
                                                "4th Fall", "4th Spring")) + 
  labs(y="Full-Time Students Retained", x="Semesters at Hamline", title="Rention at Hamline") + 
  theme(plot.title=element_text(hjust=0.5)) + guides(alpha="none")

aval <- list()
for(step in 1:14) {
  yr = step+2005
  aval[[step]] <-list(visible = FALSE,
                      name = paste0('Year = ', yr),
                      label = yr,
                      pd=c("1st Fall Semester", "1st Spring Semester",
                            "2nd Fall Semester", "2nd Spring Semester",
                            "3rd Fall Semester", "3rd Spring Semester",
                            "4th Fall Semester", "4th Spring Semester"),
                      x=1:8,
                      y=(ret2 %>% filter(Year==yr))$ct,
                      alpha=(ret2 %>% filter(Year==yr))$pct)
}
aval[1][[1]]$visible = T

steps <- list()
fig <- plot_ly()
for (i in 1:14) {
  yr = i+2005
  fig = fig %>% add_bars(y=aval[i][[1]]$pd, x=aval[i][[1]]$y, 
                         text=scales::percent(aval[i][[1]]$alpha),
                         #opacity = aval[i][[1]]$alpha, 
                         marker = list(color=hamline_red, opacity = aval[i][[1]]$alpha/2+0.5),
                         visible = aval[i][[1]]$visible, 
                         name = '', 
                         type = 'bar', 
                         hoverinfo = 'text',
                         hovertext = paste(aval[i][[1]]$y, "students"),
                         orientation= 'h', showlegend=F)

  step <- list(args = list('visible', rep(FALSE, length(aval))),
               method = 'restyle', label=yr)
  step$args[[2]][[i]] = TRUE  
  steps[[i]] = step 
} 


fig = fig %>%
  layout(sliders = list(list(active = 0,
                             currentvalue = list(prefix = "Year: "),
                             steps = steps,
                             pad = list(t=60))),
                    xaxis = list(title="Full-Time Students Retained from First-Year Cohort", range=c(0, 600)),
         margin = list(pad=10)
) 

fig

Academic Programs

Anecdotally, my conversations with Hamline professors about Miller’s administration have tended toward airing out frustrations with several years of “rightsizing” and “program review” which aimed to reduce expenses by removing or restricting academic programs with limited attendance or limited financial returns. While their complaints are often qualitative—including a sense of job insecurity and interdepartmental tension over their shared, scant resources—we will proceed with one coarse approach for quantifying this upheaval.

I gathered data from the University’s bulletins to tabulate the Academic Programs offered for each of the past 14 years. By comparing each year to the previous year, we can see how many programs were added and how many were removed.

There are important limits to these data which should be considered: the comparison between years relies entirely on the literal names of the programs offered. If a “Bachelor of Arts in Public Health” is relabeled as a “Bachelor of Arts (BA) in Public Health” the next year, that is counted as both 1 program lost and 1 program gained. Still, an imbalance of program changes signifies a true loss or gain of a program, and many name changes do reflect a real, substantive change to the program.

Since Miller’s term began, we can see a clear, new trend of growing upheaval in the programs offered at Hamline.

Yearly change in the number of academic programs at Hamline since 2009

programs %>% select(-c(cert, major, minor, prep, license, diploma)) %>% 
  left_join(programs %>% group_by(name) %>% summarize(s = min(yr), e=max(yr))) %>% 
  group_by(name) %>% summarize(Started=s[1], Ended=e[1]) %>%
  mutate(fm=Started>2014) %>%
  pivot_longer(cols=c(Started, Ended), names_to = "type", values_to = "dt") %>%
  filter(dt > 2008, dt<2023) %>%
  group_by(dt, type) %>% summarize(amt=length(dt)) %>%
  mutate(amt = ifelse(type=="Ended", -amt, amt), 
         type = factor(type, levels=c("Started", "Ended"), labels=c("Programs Started", "Programs Ended"))) %>%
  ggplot(aes(x=dt, y=amt, fill=type)) + geom_bar(stat='identity') + 
  geom_vline(xintercept=2015.5, linetype="dashed") +
  geom_text(x=2015.7, y=-38, label="President Miller's First Term", angle=90, family="Avenir", face="italic", size=textsz*0.28) +
  scale_x_continuous(breaks=c(2009:2022), labels=c("'09", "'10", "'11", "'12", "'13", "'14", "'15", "'16", "'17", "'18", "'19", "'20", "'21", "'22")) +
  labs(x="Year", y="Change in the number of academic programs", fill="") + theme_minimal() + 
  guides(fill=guide_legend(nrow=2, byrow=T)) +
  theme(axis.text.x = element_text( vjust=1),
        text=element_text(family="Avenir", size=textsz),
        axis.title = element_text(face="bold", size=textsz*1.2),
        axis.title.x = element_text(hjust=0.5, vjust=-4),
        axis.title.y = element_text(hjust=1.5, vjust=1.4),
        plot.title = element_text(face="bold"),
        legend.position = "bottom",
        legend.direction = "vertical",
        legend.justification="right",
        legend.box.margin = margin(-50, 3, 0, 0),
        legend.text = element_text(size=textsz*0.95),
        legend.spacing.y = unit(20, "pt")
        ) + 
  scale_fill_manual(values=c("darkgray", hamline_red))

Finances

Lastly, I explored Hamline’s finances since 2012.

Despite the reliable frustration in response to Hamline’s annual tuition increase announcement, nearly every university raises its tuition year after year. Still, the university’s financial stability has been a major concern since before Miller’s presidency, and with a sizable budget deficit looming over campus, this Miller’s final year looks no different.

When I interviewed President Miller on Nov. 30, 2023, she confirmed that the annual tuition change is part of Hamline being a “tuition-funded University” affected by inflation and declining enrollment and that she had prioritized growing the school’s endowment throughout her term.

The financial reports of private, non-profit universities like Hamline are public4. This form includes an itemized list of major expenses which are totaled into a single “Total Expenses” field. When that number is divided by the university’s reported enrollment, we arrive at an approximated Expenses Per Student which might reasonably be expected to correlate with what the university charges for tuition. In the MIAC at large, it does. At Hamline, despite declining enrollment numbers, the reported Expenses Per Student fell from more than $40k to less than $25k while tuition steadily climbed past $40k. Where is all that money going?

Reported Expenses Per Student vs Tuition

p1 = pc %>% select(School, TotalExpenses, Year) %>% 
  group_by(School, Year) %>% filter(Year < 2021) %>% summarize(School=School[1], Year=Year[1], TotalExpenses=TotalExpenses[1]) %>% 
  mutate(Pop = as.numeric(getPop(School, Year)), 
         ExpensePerStudent=TotalExpenses/Pop, 
         isHU = ifelse(School=="HU", "Hamline", "MIAC")) %>% 
  group_by(isHU, Year) %>% summarize(ExpensePerStudent = mean(ExpensePerStudent)) %>% left_join(tuits %>% filter(isHU=="Hamline")) %>%
  filter(isHU=="Hamline") %>%
  ggplot(aes(x=Year, y=ExpensePerStudent)) + scale_x_continuous(breaks=2012:2020) +
  geom_area(aes(y=amt), linetype="dashed", linewidth=4, fill="#9d2235") + 
  theme_minimal() + 
  geom_area(linewidth=4, fill="darkgray", alpha=0.8) +
  scale_y_continuous(labels = scales::label_dollar(), limits=c(0, 50000)) +
  geom_text(x=2016, y=10000, label="Total university expenses per student", family="Avenir", size=textsz*0.25) +
  geom_text(x=2018, y=35000, label="Hamline university in-state tuition", col="white", family="Avenir", size=textsz*0.25) + 
  labs(y="Cost of tuition and cost of university expenses (USD)\n", x="\nYear", title="Tuition vs. university expenses per student at Hamline University") + 
  theme(plot.title = element_text(hjust=0.5, face="bold"),
        axis.title = element_text(face="bold"),
        text = element_text(family="Avenir", size=textsz*0.6))

p2 = pc %>% select(School, TotalExpenses, Year) %>% 
  group_by(School, Year) %>% filter(Year < 2021) %>% summarize(School=School[1], Year=Year[1], TotalExpenses=TotalExpenses[1]) %>% 
  mutate(Pop = as.numeric(getPop(School, Year)), 
         ExpensePerStudent=TotalExpenses/Pop, 
         isHU = ifelse(School=="HU", "Hamline", "MIAC")) %>% 
  group_by(isHU, Year) %>% summarize(ExpensePerStudent = mean(ExpensePerStudent)) %>% left_join(tuits %>% mutate(isHU!="Hamline")) %>%
  group_by(isHU, Year) %>% summarize(ExpensePerStudent = mean(ExpensePerStudent), amt=mean(amt)) %>%
  filter(isHU!="Hamline") %>%
  ggplot(aes(x=Year, y=ExpensePerStudent)) + scale_x_continuous(breaks=2012:2020) +
  theme_minimal() + 
  geom_area(linewidth=4, fill="darkgray", alpha=0.8) +
  geom_area(aes(y=amt), linetype="dashed", linewidth=4, fill="#0f7754") + 
  scale_y_continuous(labels = scales::label_dollar(), limits=c(0, 50000)) +
  geom_text(x=2014.6, y=41000, label="Mean total university expenses per student", family="Avenir", size=textsz*0.25) +
  geom_text(x=2016, y=20000, label="MIAC mean in-state tuition", col="white", family="Avenir", size=textsz*0.25) + 
  labs(y="Cost of tuition and cost of university expenses (USD)\n", x="\nYear", title="Tuition vs. university expenses per student in the MIAC") + 
  theme(plot.title = element_text(hjust=0.5, face="bold"),
        axis.title = element_text(face="bold"),
        text = element_text(family="Avenir", size=textsz*0.6))


grid.arrange(p1, p2, ncol=2)

The MIAC schools vary significantly, and that in turn limits the meaning of any direct comparison of the dollar amount of administrative salaries at different schools. However, Form 990 also includes a report of all compensation paid to university employees. By instead comparing the portion of all university compensation that is paid to the university president, we can see that Hamline’s presidential portion has grown sizably since the start of Miller’s presidency, not only in excess of the MIAC average but in complete opposition to the average decrease seen during the COVID-19 pandemic.

Change in the Presidential Portion of All Compensation, Hamline vs. Mean in the MIAC

#pdf('PresPayChange.pdf', width=12, height=9)

pc %>% filter(Title %in% c("PRESIDENT", "President"), !(School %in% c("St. Mary", "St. Kate"))) %>% 
  mutate(CompRate = ReportableCompFromOrg/(OfficerPay + OtherSalaries)) %>% 
  group_by(isHU, Year) %>% summarize(CompRate = mean(CompRate)) %>% arrange(Year) %>%
  ggplot(aes(x=Year, y=CompRate)) + geom_line(aes(color=isHU), linewidth=5) + pct +
  theme_minimal() + labs(col="", y = "Presidential portion of all university compensation") +
  geom_vline(xintercept=2015, linetype="dashed") +
  geom_text(aes(x=-900), x=2015.2, y=0.015, label="President Miller's First Term", angle=90, family="Avenir",
            size=textsz*0.28) +
  scale_x_continuous(breaks=c(2012:2021), 
                     labels=c("'12", "'13", "'14", "'15", "'16", "'17", "'18", "'19", "'20", "'21"), 
                     limits=c(2012, 2021)) +
  guides(col=guide_legend(nrow=2, byrow=T), label = F, text = F, col=F) +
  theme(axis.text.x = element_text( vjust=1),
        text=element_text(family="Avenir", size=textsz),
        axis.title = element_text(face="bold", size=textsz*1.2),
        axis.title.x = element_text(hjust=0.5, vjust=-4),
        axis.title.y = element_text(hjust=1, vjust=1.4),
        plot.title = element_text(face="bold"),
        legend.position = "bottom",
        legend.direction = "vertical",
        legend.justification="right",
        legend.box.margin = margin(-50, 3, 0, 0),
        legend.text = element_text(size=textsz*0.95),
        legend.spacing.y = unit(20, "pt")
        ) + 
  scale_color_manual(values=c(hamline_red, miac_green))

#dev.off()

Notes


  1. I used Python to manually wrangle some of the XML into a dataframe saved as a CSV.↩︎

  2. I used the Python package BeautifulSoup to scrape previous years’ course listing pages↩︎

  3. Wherever an individual retention figure is reported for a university, it generally refers to the portion of the previous year’s cohort who returned for the fall semester of their second year.↩︎

  4. Though there is often a lengthy (multi-year) delay between a year’s tax season and public access to the 990 form.↩︎

---
title: "The State of Hamline University"
author: "Ben Rosenberg"
date: "`r Sys.Date()`"
output: 
  openintro::lab_report:
    code_folding: hide
    theme: journal

---

```{r load-packages, message=FALSE, echo=F, results=F}
library(tidyverse)
library(plotly)
library(showtext)
library(shiny)
library(purrr)
library(gridExtra)

showtext_auto()


#knitr::opts_chunk$set(echo = F, warning=F, message=F, fig.width=8)
knitr::opts_chunk$set(echo = T, warning=F, message=F, fig.width=8)

rm(list = ls())
```

```{r}
# Custom Functions

getPop = function(schoolnameV, yearV) {
  n = yearV-2011
  converter = list()
  converter[["Macalester"]] = "Macalester College"
  converter[["HU"]] =  "Hamline University"
  converter[["St. Olaf"]] = "St Olaf College"
  converter[["Gustavus"]] =  "Gustavus Adolphus College"
  converter[["Bethel"]] = "Bethel University"
  converter[["Augsburg"]] =  "Augsburg University"
  converter[["Carleton"]] =  "Carleton College"
  converter[["St. Benedict"]] = "College of Saint Benedict"
  converter[["Concordia"]] = "Concordia University-Saint Paul"
  converter[["St. John"]] = "Saint Johns University"
  converter[["St. Scholastica"]] = "The College of Saint Scholastica"
  converter[["St. Kate"]] ="St Catherine University"
  converter[["St. Mary"]] ="Saint Mary's University of Minnesota"
  
  out = c()
  for (i in 1:length(schoolnameV)) {
    out = c(out, pop[converter[[schoolnameV[i]]]][n[i],])
  }
  
  return(out)
}

thou_to_int = function(x) {
  y = str_replace_all(x, ',', '')
  y = str_replace_all(y, '-', '0')
  y = as.numeric(y)
  return(y)
}

```

```{r message=F}
#Loading Data
miac_id = c(174899, 174844, 174817, 174792, 175005, 173902, 173665, 173647, 173328, 174747, 173258, 173160, 173045)

enrollment = read.csv('/Users/blrosenberg/RStudio/DataViz/Hamline Finances/MNEnrollment.csv') %>%
  mutate_at(.vars=vars(-Unit.Id, -Institution.Name), .funs=thou_to_int)
en_miac = enrollment %>% filter(Unit.Id %in% miac_id) %>% select(-Unit.Id) %>% t() %>% data.frame()
rownames(en_miac) = str_replace_all(rownames(en_miac), 'X', '')
colnames(en_miac) = en_miac[1,]
en_miac = en_miac[2:11,]
pop = en_miac

id_name_conv = enrollment %>% filter(Unit.Id %in% miac_id) %>% select(Unit.Id, Institution.Name)

idnum_to_name = function(idnum) {
  return ((id_name_conv %>% filter(Unit.Id==idnum))$Institution.Name)
}

pc = read.csv('/Users/blrosenberg/Coding/Python_Projects/Classes/Oracle/990s/MIAC/PayCombined.csv') %>% 
  mutate(isHU = ifelse(School=="HU", "Hamline", "MIAC (mean)")) %>% mutate(pop = getPop(School, Year))

yrPop = pop %>% mutate(Year = rownames(pop)) %>%
  pivot_longer(cols=-c(Year), names_to="School", values_to="Population") %>% 
  mutate(School = str_replace_all(str_replace_all(School, '\\.s', "'s"), '\\.', ' '))
  
yrPop = yrPop %>% left_join(yrPop %>% group_by(Year) %>% summarize(MIAC_Pop = sum(as.numeric(Population)))) %>%
  mutate(Portion = as.numeric(Population)/MIAC_Pop)

courses = read.csv('/Users/blrosenberg/Coding/Python_Projects/Classes/Oracle/Bulletins/Workday/courses.csv')

programs = read.csv('/Users/blrosenberg/Coding/Python_Projects/Classes/Oracle/Bulletins/programs.csv') %>% mutate_at(.vars=c('cert', 'major', 'minor', 'prep', 'license', 'diploma'), .funs=as.logical) 
retention = read.csv('/Users/blrosenberg/RStudio/DataViz/Hamline Finances/Retention.csv')

for (i in 2012:2022) {
  assign(paste0('tuits', i), read.csv(paste0('/Users/blrosenberg/Coding/Python_Projects/Classes/Oracle/990s/Tuition/ic', i, '_ay.csv')))
}

tuits2012 = tuits2012 %>% mutate(UNITID = as.numeric(rownames(tuits2012)))
tuits_full = list(tuits2012, tuits2013, tuits2014, tuits2015,
             tuits2016, tuits2017, tuits2018, tuits2019,
             tuits2020, tuits2021, tuits2022) %>% reduce(full_join)
  
tuits2012 = tuits2012 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2012)
tuits2013 = tuits2013 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2013)
tuits2014 = tuits2014 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2014)
tuits2015 = tuits2015 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2015)
tuits2016 = tuits2016 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2016)
tuits2017 = tuits2017 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2017)
tuits2018 = tuits2018 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2018)
tuits2019 = tuits2019 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2019)
tuits2020 = tuits2020 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2020)
tuits2021 = tuits2021 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2021)
tuits2022 = tuits2022 %>% filter(UNITID %in% miac_id) %>% mutate(Name=idnum_to_name(UNITID), YR=2022)

tuits = list(tuits2012, tuits2013, tuits2014, tuits2015,
             tuits2016, tuits2017, tuits2018, tuits2019,
             tuits2020, tuits2021, tuits2022) %>% reduce(full_join)

tuits = tuits %>% mutate(amt = as.numeric(ifelse(TUITION1=="R", XTUIT1, TUITION1))) %>% select(Name, YR, amt) %>% mutate(isHU = ifelse(Name=="Hamline University", "Hamline", "MIAC"), Year=YR)
```

```{r warning=F}
# Styling

font_add('Avenir', "/Users/blrosenberg/Coding/Python_Projects/Classes/Oracle/fonts/Avenir.ttc", bold="/Users/blrosenberg/Coding/Python_Projects/Classes/Oracle/fonts/AvenirBlack.ttf", italic="/Users/blrosenberg/Coding/Python_Projects/Classes/Oracle/fonts/AvenirLight.ttf")
textsz = 20

xscale = scale_x_continuous(breaks = c(2012:2021), limits=c(2012, 2021))
disc_size = scale_size_discrete(range=c(0.8, 2))
disc_col =scale_color_manual(values = c("#ea5545", "#f46a9b", "#ef9b20", "#edbf33", "#ede15b", "#bdcf32", "#87bc45", "#27aeef", "#b33dc6", "#00ffff", "#000000", "red", "darkgray", "blue"))
hides = guides(linetype="none", size="none")
dollars = scale_y_continuous(labels = scales::label_dollar())
pct = scale_y_continuous(labels = scales::label_percent())
btm = theme(legend.position="bottom")
miac_green = "#0f7754"
hamline_red = "#9d2235"
```

# Introduction + Data Background

As part of my work for the campus newspaper, *The Oracle*, during President Miller's retirement, I opted to review some of Hamline's data to get a fuller, quantitative assessment of the state of the university throughout her eight-year presidency (Fall 2015 -- Fall 2023).

The visualizations that follow make use of several queried sets of [university population and tuition data from the National Center for Education Statistics' Integrated Postsecondary Education Data System (IPEDS)](https://nces.ed.gov/ipeds/datacenter/InstitutionList.aspx?stepId=1&viewinstitutions=view&sid=c6a89095-9a15-44e9-9369-d9ec5dc0bf73&rtid=1) in combination with my own custom-scraped datasets derived from a few different sources.

Namely, those are:

* XML formatted [990 forms provided by ProPublica](https://projects.propublica.org/nonprofits/organizations/410693960) ^[I used Python to manually wrangle some of the XML into a dataframe saved as a CSV.]
* Hamline's registration platform, Workday. ^[I used the Python package BeautifulSoup to scrape previous years' course listing pages]
* [Hamline's previously posted bulletins](http://bulletin.hamline.edu/content.php?catoid=32&navoid=1564)

# Students

Hamline is shrinking. *Why* it is shrinking is beyond our scope here, but these data do allow us to give more consideration to *how severely* and *for how long* the enrollment numbers have been falling. With that context, we are better prepared to assess Miller's administration's impact on enrollment. For better or worse, did they make a difference? 

A decade ago, Hamline was one of the largest universities in its athletic conference, the Minnesota Intercollegiate Athletic Conference (MIAC). Since then, Hamline's enrollment numbers have fallen. 

Miller's administration did not produce a noticeable change in the university's depopulation rate.

## Total Student Population over time, Hamline vs. mean in the MIAC


```{r fig.width=12, fig.height=9, message=F, warning=F}
#pdf('PopulationChange.pdf', width=12, height=9)
en_miac %>% mutate(Year = rownames(en_miac)) %>%
  pivot_longer(cols=-c(Year), names_to="School", values_to="Population") %>% 
  mutate(isHU = ifelse(School=="Hamline University", "Hamline", "MIAC (mean)")) %>% 
  group_by(Year, isHU) %>% summarize(Population = mean(as.numeric(Population)), Year=as.numeric(Year[1])) %>%
  ggplot(aes(x=Year, y=Population)) + geom_line(aes(col=isHU), linewidth=4) + labs(col="", y="Total Student Population") +
  geom_vline(xintercept=2015.5, linetype="dashed") +
  geom_text(x=2015.7, y=4400, label="President Miller's First Term", angle=90, family="Avenir", face="italic", size=textsz*0.28) +
  scale_x_continuous(breaks=c(2012:2021), labels=c("'12", "'13", "'14", "'15", "'16", "'17", "'18", "'19", "'20", "'21")) + theme_minimal() +
  guides(col=guide_legend(nrow=2, byrow=T)) +
  theme(axis.text.x = element_text( vjust=1),
        text=element_text(family="Avenir", size=textsz),
        axis.title = element_text(face="bold", size=textsz*1.2),
        axis.title.x = element_text(hjust=0.5, vjust=-4),
        axis.title.y = element_text(hjust=0.5, vjust=1.4),
        plot.title = element_text(face="bold"),
        legend.position = "bottom",
        legend.direction = "vertical",
        legend.justification="right",
        legend.box.margin = margin(-50, 3, 0, 0),
        legend.text = element_text(size=textsz*0.95),
        legend.spacing.y = unit(20, "pt")
        ) + 
  scale_color_manual(values=c(hamline_red, miac_green))
#dev.off()
```

\hfill \break
\hfill \break

While Hamline's enrollment fell steadily, enrollment numbers stayed relatively stable throughout the rest of the MIAC. As a result, the portion of students in the MIAC who attended Hamline also reliably decreased year after year.

\hfill \break
\hfill \break


## The Shrinking Portion of MIAC Students Attending Hamline Since 2012

```{r}

schoolCols = c("#666666", "#0069aa", "#0b5091", "#be0f34", "#E6B220", "#FFF", hamline_red, 
               "#D44420", "#000", "#E22739", "#4F2682", "#53585a", "#00447c")
schoolCols2 = c("#660033","#B09247","#FFD24F", "#000", "#003055","#FCCB06", "#888C8D", 
                "#01426A", "#FFFFFE", "#0C2F59", "#FFE153", "#242121", "#FFCB00")

aval <- list()
for(step in 1:10) {
  yr = step+2011
  aval[[step]] <-list(visible = FALSE,
                      name = paste0('Year = ', yr),
                      label = yr,
                      x=(yrPop %>% filter(Year==yr) %>% arrange(School))$School,
                      y=(yrPop %>% filter(Year==yr) %>% arrange(School))$Population,
                      text=(yrPop %>% filter(Year==yr) %>% arrange(School))$Portion)
}
aval[3][[1]]$visible = T

steps <- list()
fig <- plot_ly(sort=F)
for (i in 1:10) {
  yr = i+2011
  fig = fig %>% add_pie(labels=aval[i][[1]]$x, 
                        values=aval[i][[1]]$y,
                        #text=aval[i][[1]]$x,
                        visible = aval[i][[1]]$visible, 
                        marker = list(colors=schoolCols, line=list(color=schoolCols2, width=2)),
                        pull = 0.03,
                        name = '',#aval[i][[1]]$name, 
                        type = 'pie', 
                        hoverinfo = 'text',
                        hovertext = paste(
                          aval[i][[1]]$x, '\n', 
                          scales::percent(aval[i][[1]]$text, accuracy=0.01), 'of the MIAC\n', 
                          aval[i][[1]]$y, "Students"
                        ))

  step <- list(args = list('visible', rep(FALSE, length(aval))),
               method = 'restyle', label=yr)
  step$args[[2]][[i]] = TRUE  
  steps[[i]] = step 
} 

fig <- fig %>%
  layout(sliders = list(list(active = 0,
                             currentvalue = list(prefix = "Year: "),
                             steps = steps)))

fig
```

Like emigration from a country, the size of the student population at Hamline should be understood as complicated and affected subtly by many factors: some positive and some negative. Those factors include, but are not limited to, the number of applications, acceptance rate, enrollment rate (among those who have been admitted), transfers-in, transfers-out, and withdrawal rates. Put more simply: how many are coming in, how many are coming back, and how many are leaving?

Universities use a fairly strictly-defined metric, *retention*, to quantify the "How many are coming back?" portion of that equation. Rather than more generally tracking the portion of students in a given semester who also attended the same school in the previous semester, the National Center for Education Statistics specifically tracks the portion of a university's first-time students in the fall semester of their first year (that year's "cohort") who return in subsequent semesters.^[Wherever an individual *retention* figure is reported for a university, it generally refers to the portion of the previous year's cohort who returned for the fall semester of their second year.]

Looking at Hamline's officially reported retention rates since 2006, we can see a distinct change: long-term retention has fallen, and the size of the cohort has grown. Most notably, the cohort size grew by *35%* from 2009 to 2012 while the four-year retention rate fell from 58% to 54.3% over that same period. Though that change precedes Miller's term, the trend continued throughout the available data.

## Change in Student Retention at Hamline, 2006-2019

```{r message=F, warning=F}
p_to_n = function(period) {
  converter = list()
  converter["Fall1"] = 1
  converter["Fall2"] = 3
  converter["Fall3"] = 5
  converter["Fall4"] = 7
  converter["Spring1"] = 2
  converter["Spring2"] = 4
  converter["Spring3"] = 6
  converter["Spring4"] = 8
  out = c()
  for (i in period) {
    out = c(out, converter[[i]])
  }
  return(out)
}

ret2 = retention %>% mutate_all(.funs=as.numeric) %>% rename(Fall1N = Cohort) %>% 
  pivot_longer(cols=-c(Year), names_to="Period", values_to="Retained") %>% 
  mutate(isPct = !str_ends(Period, "N"), pct = Retained*isPct, Period = str_replace_all(Period, "N", ""), o=p_to_n(Period)) %>%
  group_by(Year, o) %>% summarize(pct=max(pct), ct=max(Retained))  %>% mutate(pct=ifelse(pct==0, 1, pct))

gg = ret2 %>% filter(Year==2006) %>%
  ggplot(aes(x=o, y=ct)) + geom_bar(aes(alpha=pct), stat="identity", fill=hamline_red) + coord_flip() +
  theme_minimal() + 
  scale_alpha_continuous(range=c(0.7, 1)) +
  scale_x_continuous(breaks=(1:8), 
                                       labels=c("1st Fall", "1st Spring",
                                                "2nd Fall", "2nd Spring",
                                                "3rd Fall", "3rd Spring",
                                                "4th Fall", "4th Spring")) + 
  labs(y="Full-Time Students Retained", x="Semesters at Hamline", title="Rention at Hamline") + 
  theme(plot.title=element_text(hjust=0.5)) + guides(alpha="none")

aval <- list()
for(step in 1:14) {
  yr = step+2005
  aval[[step]] <-list(visible = FALSE,
                      name = paste0('Year = ', yr),
                      label = yr,
                      pd=c("1st Fall Semester", "1st Spring Semester",
                            "2nd Fall Semester", "2nd Spring Semester",
                            "3rd Fall Semester", "3rd Spring Semester",
                            "4th Fall Semester", "4th Spring Semester"),
                      x=1:8,
                      y=(ret2 %>% filter(Year==yr))$ct,
                      alpha=(ret2 %>% filter(Year==yr))$pct)
}
aval[1][[1]]$visible = T

steps <- list()
fig <- plot_ly()
for (i in 1:14) {
  yr = i+2005
  fig = fig %>% add_bars(y=aval[i][[1]]$pd, x=aval[i][[1]]$y, 
                         text=scales::percent(aval[i][[1]]$alpha),
                         #opacity = aval[i][[1]]$alpha, 
                         marker = list(color=hamline_red, opacity = aval[i][[1]]$alpha/2+0.5),
                         visible = aval[i][[1]]$visible, 
                         name = '', 
                         type = 'bar', 
                         hoverinfo = 'text',
                         hovertext = paste(aval[i][[1]]$y, "students"),
                         orientation= 'h', showlegend=F)

  step <- list(args = list('visible', rep(FALSE, length(aval))),
               method = 'restyle', label=yr)
  step$args[[2]][[i]] = TRUE  
  steps[[i]] = step 
} 


fig = fig %>%
  layout(sliders = list(list(active = 0,
                             currentvalue = list(prefix = "Year: "),
                             steps = steps,
                             pad = list(t=60))),
                    xaxis = list(title="Full-Time Students Retained from First-Year Cohort", range=c(0, 600)),
         margin = list(pad=10)
) 

fig


```

# Academic Programs

Anecdotally, my conversations with Hamline professors about Miller's administration have tended toward airing out frustrations with several years of "rightsizing" and "program review" which aimed to reduce expenses by removing or restricting academic programs with limited attendance or limited financial returns. While their complaints are often qualitative---including a sense of job insecurity and interdepartmental tension over their shared, scant resources---we will proceed with one coarse approach for quantifying this upheaval.

I gathered data from the University's bulletins to tabulate the Academic Programs offered for each of the past 14 years. By comparing each year to the previous year, we can see how many programs were *added* and how many were *removed*.

There are important limits to these data which should be considered: the comparison between years relies entirely on the literal names of the programs offered. If a "Bachelor of Arts in Public Health" is relabeled as a "Bachelor of Arts (BA) in Public Health" the next year, that is counted as both 1 program lost and 1 program gained. Still, an imbalance of program changes signifies a true loss or gain of a program, and many name changes *do* reflect a real, substantive change to the program. 

Since Miller's term began, we can see a clear, new trend of growing upheaval in the programs offered at Hamline.

## Yearly change in the number of academic programs at Hamline since 2009

```{r message=F, warning=F, fig.width=15, fig.height=8.8}

programs %>% select(-c(cert, major, minor, prep, license, diploma)) %>% 
  left_join(programs %>% group_by(name) %>% summarize(s = min(yr), e=max(yr))) %>% 
  group_by(name) %>% summarize(Started=s[1], Ended=e[1]) %>%
  mutate(fm=Started>2014) %>%
  pivot_longer(cols=c(Started, Ended), names_to = "type", values_to = "dt") %>%
  filter(dt > 2008, dt<2023) %>%
  group_by(dt, type) %>% summarize(amt=length(dt)) %>%
  mutate(amt = ifelse(type=="Ended", -amt, amt), 
         type = factor(type, levels=c("Started", "Ended"), labels=c("Programs Started", "Programs Ended"))) %>%
  ggplot(aes(x=dt, y=amt, fill=type)) + geom_bar(stat='identity') + 
  geom_vline(xintercept=2015.5, linetype="dashed") +
  geom_text(x=2015.7, y=-38, label="President Miller's First Term", angle=90, family="Avenir", face="italic", size=textsz*0.28) +
  scale_x_continuous(breaks=c(2009:2022), labels=c("'09", "'10", "'11", "'12", "'13", "'14", "'15", "'16", "'17", "'18", "'19", "'20", "'21", "'22")) +
  labs(x="Year", y="Change in the number of academic programs", fill="") + theme_minimal() + 
  guides(fill=guide_legend(nrow=2, byrow=T)) +
  theme(axis.text.x = element_text( vjust=1),
        text=element_text(family="Avenir", size=textsz),
        axis.title = element_text(face="bold", size=textsz*1.2),
        axis.title.x = element_text(hjust=0.5, vjust=-4),
        axis.title.y = element_text(hjust=1.5, vjust=1.4),
        plot.title = element_text(face="bold"),
        legend.position = "bottom",
        legend.direction = "vertical",
        legend.justification="right",
        legend.box.margin = margin(-50, 3, 0, 0),
        legend.text = element_text(size=textsz*0.95),
        legend.spacing.y = unit(20, "pt")
        ) + 
  scale_fill_manual(values=c("darkgray", hamline_red))

```

# Finances

Lastly, I explored Hamline's finances since 2012.

Despite the reliable frustration in response to Hamline's annual tuition increase announcement, nearly every university raises its tuition year after year. Still, the university's financial stability has been a major concern since before Miller's presidency, and with a sizable budget deficit looming over campus, this Miller's final year looks no different.

When I interviewed President Miller on Nov. 30, 2023, she confirmed that the annual tuition change is part of Hamline being a "tuition-funded University" affected by inflation and declining enrollment and that she had prioritized growing the school's endowment throughout her term.

The financial reports of private, non-profit universities like Hamline are public^[Though there is often a lengthy (multi-year) delay between a year's tax season and public access to the 990 form.]. This form includes an itemized list of major expenses which are totaled into a single "Total Expenses" field. When that number is divided by the university's reported enrollment, we arrive at an approximated *Expenses Per Student* which might reasonably be expected to correlate with what the university charges for tuition. In the MIAC at large, it does. At Hamline, despite declining enrollment numbers, the reported *Expenses Per Student* fell from more than \$40k to less than *\$25k* while tuition steadily climbed past \$40k. Where is all that money going?


## Reported Expenses Per Student vs Tuition 

```{r message=F, warning=F, fig.width=16, fig.height=8}
p1 = pc %>% select(School, TotalExpenses, Year) %>% 
  group_by(School, Year) %>% filter(Year < 2021) %>% summarize(School=School[1], Year=Year[1], TotalExpenses=TotalExpenses[1]) %>% 
  mutate(Pop = as.numeric(getPop(School, Year)), 
         ExpensePerStudent=TotalExpenses/Pop, 
         isHU = ifelse(School=="HU", "Hamline", "MIAC")) %>% 
  group_by(isHU, Year) %>% summarize(ExpensePerStudent = mean(ExpensePerStudent)) %>% left_join(tuits %>% filter(isHU=="Hamline")) %>%
  filter(isHU=="Hamline") %>%
  ggplot(aes(x=Year, y=ExpensePerStudent)) + scale_x_continuous(breaks=2012:2020) +
  geom_area(aes(y=amt), linetype="dashed", linewidth=4, fill="#9d2235") + 
  theme_minimal() + 
  geom_area(linewidth=4, fill="darkgray", alpha=0.8) +
  scale_y_continuous(labels = scales::label_dollar(), limits=c(0, 50000)) +
  geom_text(x=2016, y=10000, label="Total university expenses per student", family="Avenir", size=textsz*0.25) +
  geom_text(x=2018, y=35000, label="Hamline university in-state tuition", col="white", family="Avenir", size=textsz*0.25) + 
  labs(y="Cost of tuition and cost of university expenses (USD)\n", x="\nYear", title="Tuition vs. university expenses per student at Hamline University") + 
  theme(plot.title = element_text(hjust=0.5, face="bold"),
        axis.title = element_text(face="bold"),
        text = element_text(family="Avenir", size=textsz*0.6))

p2 = pc %>% select(School, TotalExpenses, Year) %>% 
  group_by(School, Year) %>% filter(Year < 2021) %>% summarize(School=School[1], Year=Year[1], TotalExpenses=TotalExpenses[1]) %>% 
  mutate(Pop = as.numeric(getPop(School, Year)), 
         ExpensePerStudent=TotalExpenses/Pop, 
         isHU = ifelse(School=="HU", "Hamline", "MIAC")) %>% 
  group_by(isHU, Year) %>% summarize(ExpensePerStudent = mean(ExpensePerStudent)) %>% left_join(tuits %>% mutate(isHU!="Hamline")) %>%
  group_by(isHU, Year) %>% summarize(ExpensePerStudent = mean(ExpensePerStudent), amt=mean(amt)) %>%
  filter(isHU!="Hamline") %>%
  ggplot(aes(x=Year, y=ExpensePerStudent)) + scale_x_continuous(breaks=2012:2020) +
  theme_minimal() + 
  geom_area(linewidth=4, fill="darkgray", alpha=0.8) +
  geom_area(aes(y=amt), linetype="dashed", linewidth=4, fill="#0f7754") + 
  scale_y_continuous(labels = scales::label_dollar(), limits=c(0, 50000)) +
  geom_text(x=2014.6, y=41000, label="Mean total university expenses per student", family="Avenir", size=textsz*0.25) +
  geom_text(x=2016, y=20000, label="MIAC mean in-state tuition", col="white", family="Avenir", size=textsz*0.25) + 
  labs(y="Cost of tuition and cost of university expenses (USD)\n", x="\nYear", title="Tuition vs. university expenses per student in the MIAC") + 
  theme(plot.title = element_text(hjust=0.5, face="bold"),
        axis.title = element_text(face="bold"),
        text = element_text(family="Avenir", size=textsz*0.6))


grid.arrange(p1, p2, ncol=2)
```

The MIAC schools vary significantly, and that in turn limits the meaning of any direct comparison of the dollar amount of administrative salaries at different schools. However, Form 990 also includes a report of *all compensation paid to university employees*. By instead comparing the portion of all university compensation that is paid to the university president, we can see that Hamline's presidential portion has grown sizably since the start of Miller's presidency, not only in excess of the MIAC average but in complete opposition to the average decrease seen during the COVID-19 pandemic.

## Change in the Presidential Portion of All Compensation, Hamline vs. Mean in the MIAC

```{r message=F, warning=F, fig.width=12, fig.height=9}
#pdf('PresPayChange.pdf', width=12, height=9)

pc %>% filter(Title %in% c("PRESIDENT", "President"), !(School %in% c("St. Mary", "St. Kate"))) %>% 
  mutate(CompRate = ReportableCompFromOrg/(OfficerPay + OtherSalaries)) %>% 
  group_by(isHU, Year) %>% summarize(CompRate = mean(CompRate)) %>% arrange(Year) %>%
  ggplot(aes(x=Year, y=CompRate)) + geom_line(aes(color=isHU), linewidth=5) + pct +
  theme_minimal() + labs(col="", y = "Presidential portion of all university compensation") +
  geom_vline(xintercept=2015, linetype="dashed") +
  geom_text(aes(x=-900), x=2015.2, y=0.015, label="President Miller's First Term", angle=90, family="Avenir",
            size=textsz*0.28) +
  scale_x_continuous(breaks=c(2012:2021), 
                     labels=c("'12", "'13", "'14", "'15", "'16", "'17", "'18", "'19", "'20", "'21"), 
                     limits=c(2012, 2021)) +
  guides(col=guide_legend(nrow=2, byrow=T), label = F, text = F, col=F) +
  theme(axis.text.x = element_text( vjust=1),
        text=element_text(family="Avenir", size=textsz),
        axis.title = element_text(face="bold", size=textsz*1.2),
        axis.title.x = element_text(hjust=0.5, vjust=-4),
        axis.title.y = element_text(hjust=1, vjust=1.4),
        plot.title = element_text(face="bold"),
        legend.position = "bottom",
        legend.direction = "vertical",
        legend.justification="right",
        legend.box.margin = margin(-50, 3, 0, 0),
        legend.text = element_text(size=textsz*0.95),
        legend.spacing.y = unit(20, "pt")
        ) + 
  scale_color_manual(values=c(hamline_red, miac_green))

#dev.off()

```


# Notes
